C5_blackjack
1 | import numpy as np |
C6_TD
1 | import gym |
C9_semiGTD
1 | # 绘制位置和速度图像 |
C9_tile_coding
1 | #!/usr/bin/env python |
C13_AC
朴素AC(TD自举)
1 | import gym |
朴素AC(monte carlo)
1 | import gym |
C13_PG
REINFORCE (on policy版)
1 | import gym |
REINFORCE (off policy版)
1 | import gym |